Text Data Exploration

In [1]:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
import requests
import json
import chart_studio.plotly as py
import plotly.express as px
import plotly.figure_factory as ff

Retrieve Text Data From Firebase

In [2]:
# Download the test data from the Firebase REST endpoint and load it into a DataFrame.
test_url = 'https://finalproject-42236-default-rtdb.firebaseio.com/test.json'
# Bound the wait so a stalled connection cannot hang the kernel, and fail
# loudly on an HTTP error instead of parsing an error payload as data.
response = requests.get(test_url, timeout=30)
response.raise_for_status()
text_test = response.json()
# A JSON `null` body would otherwise turn into a silently empty DataFrame
# and the plotting cells below would simply draw nothing.
if text_test is None:
    raise ValueError(f"No data returned from {test_url}")
test_t = pd.DataFrame.from_dict(text_test, orient='columns')
In [3]:
# Download the training data from the Firebase REST endpoint and load it into a DataFrame.
train_url = 'https://finalproject-42236-default-rtdb.firebaseio.com/train.json'
# Bound the wait so a stalled connection cannot hang the kernel, and fail
# loudly on an HTTP error instead of parsing an error payload as data.
response = requests.get(train_url, timeout=30)
response.raise_for_status()
text_train = response.json()
# A JSON `null` body would otherwise turn into a silently empty DataFrame
# and the plotting cells below would simply draw nothing.
if text_train is None:
    raise ValueError(f"No data returned from {train_url}")
train_t = pd.DataFrame.from_dict(text_train, orient='columns')

Interactive Data Visualization

Data Distribution

For training data

In [4]:
# Draw one interactive histogram per column of the training frame.
# The title names the split and the column so each figure stands on its own.
for col in train_t.columns:
    fig = px.histogram(train_t, x=col, title=f"Training data: distribution of {col}")
    fig.show()

For testing data

In [5]:
# Draw one interactive histogram per column of the testing frame.
# The title names the split and the column so each figure stands on its own.
for col in test_t.columns:
    fig = px.histogram(test_t, x=col, title=f"Testing data: distribution of {col}")
    fig.show()

Box Plot

For training data

In [6]:
# Draw one interactive box plot per column of the training frame, split by "Group".
for col in train_t.columns:
    # "Group" is the x-axis category, so it is not plotted against itself.
    if col == "Group":
        continue
    # The title names the split and the column so each figure stands on its own.
    fig = px.box(train_t, x="Group", y=col, title=f"Training data: {col} by Group")
    fig.show()

For testing data

In [7]:
# Draw one interactive box plot per column of the testing frame, split by "Group".
for col in test_t.columns:
    # "Group" is the x-axis category, so it is not plotted against itself.
    if col == "Group":
        continue
    # The title names the split and the column so each figure stands on its own.
    fig = px.box(test_t, x="Group", y=col, title=f"Testing data: {col} by Group")
    fig.show()
In [ ]: